Languguage OS 2

home *** CD-ROM | disk | FTP | other *** search

/ Languguage OS 2 / Languguage OS II Version 10-94 (Knowledge Media)(1994).ISO / a_utils / decomp.lha / decomp / hier.c < prev next >

Wrap

C/C++ Source or Header | 1988-01-12 | 21KB | 924 lines

/* * Module: hier.c * * Author: J. Reuter * * This module converts a directed graph of basic blocks into * a tree of generic control constructs. It is based on the * Unix "struct" program (which is poorly commented, so this is * too). */ #include "defs.h" #include "nodes.h" #define CHILDNUM(v) (node_info[node_array[v]->node_type].num_children) struct hierarchy { int h_after; /* node numbers associated with after numbers*/ int h_ntobef; /* before numbers associated with nodes */ int h_ntoaft; /* after numbers associated with nodes */ int h_head; struct list *h_inarc; int h_dom; }; #define after(n) (h[n].h_after) #define ntobef(n) (h[n].h_ntobef) #define ntoaft(n) (h[n].h_ntoaft) #define head(n) (h[n].h_head) #define inarc(n) (h[n].h_inarc) #define dom(n) (h[n].h_dom) struct hierarchy *h; /* where we allocate the hierarchy structure */ struct list { int element; struct list *next_list; }; struct list *consls(); struct node *get_orif(); int access_count; /* number of nodes accessible from start */ static int exit_size = 0; /* threshold for loop inclusion of small exit code */ hier() { register int v; /* find back edges, unreachable nodes */ dfs(); /* sets head(v) to N_ITER heading smallest loop containing v or NONE */ gethead(); /* sets inarc(v) to list of forward arcs entering v */ getinarc(); /* sets dom(v) to immediate dominator of v or NONE */ getdom(); /* build the tree structure using head, inarc, dom */ gettree(); for (v = 0; v < node_count; v++) { freelst( inarc(v) ); inarc(v) = 0; } free( h ); } #define UNSEEN 0 #define STACKED 1 #define FINISHED 2 /* * depth-first search used to identify back edges, unreachable nodes; * each node v entered by back edge replaced by * N_LOOP ->N_ITER -> v, * so that back edges entering v now enter the N_ITER, * and other edges entering v now enter the N_LOOP. * Nodes are numbered according to depth-first search: * before numbering- ntobef(v) = i => node numbered v is i'th * node in order of first visit during the search; * after numbering- ntoaft(v) = i => node numbered v is i'th * node visited in order of last visit during the search. * Also, in this case after(i) = v. */ static int befcount, aftcount; /* following defines used to mark back edges and nodes entered by back edges */ #define mark(n) n->reach = 1; /* mark node n */ #define unmark(n) n->reach = 0; #define marked(n) (n->reach == 1) #define mark_edge(e) if ((e)>-1) (e) = -2-(e); /* mark edge e */ #define unmark_edge(e) if ((e)<-1) (e) = -2-(e); #define marked_edge(e) ((e) < -1) static dfs() /* depth first search */ { register int i; register int w; for ( w = 0; w < node_count; w++ ) { node_array[w]->node_scratch = UNSEEN; node_array[w]->reach = 0; /* use reach to count inarcs */ } if_inarcs( 0 ); for ( w = 0; w < node_count; w++ ) node_array[w]->node_scratch = UNSEEN; compound_if( 0 ); access_count = 0; for ( w = 0; w < node_count; w++ ) { node_array[w]->node_scratch = UNSEEN; unmark( node_array[w] ); } search( 0 ); unreach(); addloop(); h = (struct hierarchy *) malloc( node_max * sizeof( struct hierarchy ) ); if ( h == NULL ) { fprintf( stderr, "Out of memory\n" ); exit( 1 ); } for (i = 0; i < access_count; ++i) after(i) = NONE; for (w = 0; w < node_count; ++w) ntobef(w) = ntoaft(w) = NONE; befcount = 0; aftcount = 0; repsearch(0); } /* * compound_if converts complex branch logic into compound if statements. * Only N_ORIFs are generated here. Boolean logic will later convert * negated N_ORIFs into N_ANDIFs. * In addition, each N_CASE node is nested within a N_SWITCH node to * allow for proper nesting of case bodies and case labels are added. */ /* first count inarcs */ static if_inarcs( v ) register int v; { register struct node *n; register int i, adj; n = node_array[v]; n->node_scratch = STACKED; for ( i = 0; i < n->num_arcs; i++ ) { adj = n->arcs[i]; node_array[adj]->reach++; if ( node_array[adj]->node_scratch == UNSEEN ) if_inarcs( adj ); } n->node_scratch = FINISHED; } /* now collapse if's */ /* reach contains inarc count for node */ static compound_if( v ) register int v; { register int i; register int adj; register struct node *m, *n, *new; n = node_array[v]; n->node_scratch = STACKED; for ( i = 0; i < n->num_arcs; i++ ) { adj = n->arcs[i]; if ( node_array[adj]->node_scratch == UNSEEN ) compound_if( adj ); } if ( n->node_type == N_IF || n->node_type == N_ORIF ) { m = node_array[ n->arcs[THEN_ARC] ]; if ( ( m->node_type == N_IF || m->node_type == N_ORIF ) && m->node_scratch == FINISHED && m->reach == 1 ) if ( m->arcs[THEN_ARC] == n->arcs[ELSE_ARC] ) { new = get_orif( v, TRUE, n->arcs[THEN_ARC], FALSE, n->arcs[ELSE_ARC], m->arcs[ELSE_ARC] ); i = m->arcs[THEN_ARC]; new->reach = n->reach; m->arcs[THEN_ARC] = NONE; m->arcs[ELSE_ARC] = NONE; n->arcs[THEN_ARC] = NONE; n->arcs[ELSE_ARC] = NONE; node_array[v] = new; node_array[node_count - 1] = n; node_array[i]->reach--; compound_if( v ); goto skip_else; } else if ( m->arcs[ELSE_ARC] == n->arcs[ELSE_ARC] ) { new = get_orif( v, TRUE, n->arcs[THEN_ARC], TRUE, n->arcs[ELSE_ARC], m->arcs[THEN_ARC] ); i = m->arcs[ELSE_ARC]; new->reach = n->reach; m->arcs[THEN_ARC] = NONE; m->arcs[ELSE_ARC] = NONE; n->arcs[THEN_ARC] = NONE; n->arcs[ELSE_ARC] = NONE; node_array[v] = new; node_array[node_count - 1] = n; node_array[i]->reach--; compound_if( v ); goto skip_else; } m = node_array[ n->arcs[ELSE_ARC] ]; if ( ( m->node_type == N_IF || m->node_type == N_ORIF ) && m->node_scratch == FINISHED && m->reach == 1 ) if ( m->arcs[THEN_ARC] == n->arcs[THEN_ARC] ) { new = get_orif( v, FALSE, n->arcs[ELSE_ARC], FALSE, n->arcs[THEN_ARC], m->arcs[ELSE_ARC] ); i = m->arcs[THEN_ARC]; new->reach = n->reach; m->arcs[THEN_ARC] = NONE; m->arcs[ELSE_ARC] = NONE; n->arcs[THEN_ARC] = NONE; n->arcs[ELSE_ARC] = NONE; node_array[v] = new; node_array[node_count - 1] = n; node_array[i]->reach--; compound_if( v ); } else if ( m->arcs[ELSE_ARC] == n->arcs[THEN_ARC] ) { new = get_orif( v, FALSE, n->arcs[ELSE_ARC], TRUE, n->arcs[THEN_ARC], m->arcs[THEN_ARC] ); i = m->arcs[ELSE_ARC]; new->reach = n->reach; m->arcs[THEN_ARC] = NONE; m->arcs[ELSE_ARC] = NONE; n->arcs[THEN_ARC] = NONE; n->arcs[ELSE_ARC] = NONE; node_array[v] = new; node_array[node_count - 1] = n; node_array[i]->reach--; compound_if( v ); } } else if ( n->node_type == N_CASE ) { /* add a N_SWITCH node for proper case stmt nesting */ if ( node_count + n->num_arcs > node_max ) node_grow(); new = get_node( 2 ); new->node_type = N_SWITCH; new->start_address = n->start_address; new->end_address = n->end_address; new->num_arcs = 2; new->arcs[0] = n->arcs[0]; /* case exit */ new->arcs[1] = node_count - 1; /* case stmt. */ node_array[node_count - 1] = n; node_array[v] = new; /* and add some case labels */ for ( i = 1; i < n->num_arcs; i++ ) { new = get_node( 1 ); new->node_type = N_CASELAB; new->num_arcs = 1; new->arcs[0] = n->arcs[i]; n->arcs[i] = node_count - 1; new->varpart[V_CASESLOT] = i - 1 + n->varpart[V_BASE]; node_array[node_count - 1] = new; } } skip_else: node_array[v]->node_scratch = FINISHED; } static struct node * get_orif( a_pred, a_negate, b_pred, b_negate, then_arc, else_arc ) int a_pred; int a_negate; int b_pred; int b_negate; int then_arc; int else_arc; { register struct node *n; if ( node_count + 1 > node_max ) node_grow(); n = get_node( 2 ); n->node_type = N_ORIF; n->num_arcs = 2; n->arcs[THEN_ARC] = then_arc; n->arcs[ELSE_ARC] = else_arc; n->varpart[V_NEGATE] = FALSE; n->varpart[V_PRED1] = node_count - 1; /* this will be a_pred */ if ( a_negate ) node_array[a_pred]->varpart[V_NEGATE] = ! node_array[a_pred]->varpart[V_NEGATE]; n->varpart[V_PRED2] = b_pred; if ( b_negate ) node_array[b_pred]->varpart[V_NEGATE] = ! node_array[b_pred]->varpart[V_NEGATE]; return n; } /* * using depth first search, mark back edges using mark_edge, * and nodes entered by back edges using MARK */ static search( v ) register int v; { register int adj; register int i; register struct node *n; n = node_array[v]; n->node_scratch = STACKED; for (i = 0; i < n->num_arcs; i++) { adj = n->arcs[i]; if ( node_array[adj]->node_scratch == UNSEEN ) search( adj ); else if ( node_array[adj]->node_scratch == STACKED ) { /* mark adj node as entered by back edge */ mark( node_array[adj] ); /* mark edge as being back edge */ mark_edge( n->arcs[i] ); } } n->node_scratch = FINISHED; access_count += 1; } /* * mark unreachable nodes. Don't change N_IF nodes if they are * unreachable--we need the type information later. */ static unreach() { int v; for ( v = 0; v < node_count; v++ ) if ( node_array[v]->node_scratch == UNSEEN && node_array[v]->node_type != N_IF && node_array[v]->node_type != N_ORIF ) node_array[v]->node_type = N_UNREACH; } /* add N_LOOP, N_ITER at nodes entered by back edges, and adjust edges */ addloop() { register int v; register int adj; register int j; register int oldnum; register struct node *n, *loop, *iter; /* insloop increases node_count */ for (v = 0, oldnum = node_count; v < oldnum; ++v) { n = node_array[v]; if ( marked(n) ) { /* remove mark indicating v entered by back edge */ unmark(n); if ( node_count + 2 >= node_max ) node_grow(); /* add N_LOOP, N_ITER since v entered by back edge*/ loop = get_node( 1 ); loop->node_type = N_LOOP; loop->num_arcs = 1; iter = get_node( 1 ); iter->node_type = N_ITER; iter->num_arcs = 1; access_count += 2; /* want N_LOOP to take on node number v, so that arcs other than back arcs entering v will enter N_LOOP */ node_array[v] = loop; node_array[node_count-2] = iter; node_array[node_count-1] = n; loop->arcs[0] = node_count - 2; iter->arcs[0] = node_count - 1; iter->varpart[V_FATHER] = v; } } /* arcs which used to enter v now enter N_LOOP; * must make back edges enter N_ITER */ for (v = 0; v < node_count; ++v) for ( j = 0; j < node_array[v]->num_arcs; ++j ) { if ( marked_edge( node_array[v]->arcs[j] ) ) { unmark_edge( node_array[v]->arcs[j] ); adj = node_array[v]->arcs[j]; if ( node_array[adj]->node_type != N_ITER ) /* change arc to point to N_ITER */ node_array[v]->arcs[j] = node_array[adj]->arcs[0]; } } } /* repeat df search in order to fill in after, ntoaft, ntobef tables */ static repsearch(v) register int v; { register int adj; register int i, temp; ntobef(v) = befcount; befcount++; for ( i = 0; i < node_array[v]->num_arcs; i++ ) { adj = node_array[v]->arcs[i]; if ( ntobef(adj) == NONE ) repsearch( adj ); } aftcount++; temp = access_count - aftcount; after(temp) = v; ntoaft(v) = temp; } /* define ANC(v,w) true if v == w or v is ancestor of w (reflexive ancestor) */ #define ANC(v,w) ( ntobef(v) <= ntobef(w) && ntoaft(v) <= ntoaft(w) ) /* * set head(v) to N_ITER heading smallest loop containing v, for each v */ /* * Search nodes in reverse of after numbering so that all paths from * a node to an ancestor are searched before the node. * * At any point, the current value of head allows chains of nodes * to be reached from any node v by taking head(v), head(head(v)), etc. * until an NONE value is reached. Upon searching each arc, * the appropriate chains must be merged to avoid losing information. * * For example, from one path out of a node v it may be known that * v is in a loop headed by z, while from another * it may be known that v is in a loop headed by w. * Thus, head(v) must be set to whichever of z,w is the closer ancestor, * and the fact that this node is in a loop headed by the other must be * recorded in head. */ static gethead() { register int v, w, adj; register int i, j; for (v = 0; v < node_count; ++v) head(v) = NONE; for (i = access_count -1; i >= 0; i--) { v = after(i); for (j = 0; j < node_array[v]->num_arcs; ++j) { adj = node_array[v]->arcs[j]; if ( ntoaft(adj) < i ) /* back edge */ merge( v, adj ); else if ( ANC(v, adj) ) { /* not back edge or cross edge */ /* * need to do only tree edges - must not do edge (v,adj) * when head(adj) is not ANC of v */ if ( DEFINED(head(adj)) && ANC(head(adj),v) ) merge( v, head(adj) ); } else { /* cross edge */ w = lowanc( adj, v ); if ( DEFINED(w) ) merge( w, v ); } } if ( node_array[v]->node_type == N_LOOP ) /* head of N_ITER must be different N_ITER */ head(node_array[v]->arcs[0]) = head(v); } } /* find the first node in chain of y which is anc of z, if it exists */ static int lowanc( y, z ) register int y, z; { while ( y != -1 && !ANC(y,z) ) y = head(y); return y; } /* merge chains of w and y according to ANC relation */ static merge( w, y ) int w, y; { int t, min; if ( w == y ) return; if ( ANC(w,y) ) { /* set t to min of w,y */ t = y; y = head(y); } else { t = w; w = head(w); } /* construct chain at t by adding min of remaining elements */ while (w != -1 && y != -1) { if ( ANC(w,y) ) { min = y; y = head(y); } else { min = w; w = head(w); } if ( t != min ) { head(t) = min; t = min; } } if ( w == -1 ) min = y; else min = w; if ( t != min ) head(t) = min; } /* * find forward in-arcs for each node, pretending that arcs which jump * into a loop jump to the head of the largest such loop instead, based * on the depth first search tree */ /* construct array "inarc" containing in arcs for each node */ static getinarc() { register int v, adj, x; register int i, j; for (v=0; v < node_count; v++) inarc(v) = 0; /* fill in inarc nodes */ for (i = 0; i < access_count; ++i) { v = after(i); for (j = 0; j < node_array[v]->num_arcs; ++j) { adj = node_array[v]->arcs[j]; /* not a back edge */ /* if edge jumps into loop, pretend jumps to head of largest loop jumped into */ if ( ntoaft(adj) > ntoaft(v) ) { x = maxentry( v, adj ); if ( !DEFINED(x) ) x = adj; else x = node_array[x]->varpart[V_FATHER]; /* insert v in list inarc[x] */ inarc(x) = consls( v, inarc(x) ); } } } } /* return z if z is N_ITER of largest loop containing y but not x, NONE otherwise */ static int maxentry( x, y ) int x, y; { if ( head(y) == NONE ) return(NONE); if ( loomem( x, head(y) ) ) return (NONE); y = head(y); while ( head(y) != NONE ) { if ( loomem( x, head(y) ) ) return(y); y = head(y); } return(y); } /* return TRUE if x is in loop headed by y, FALSE otherwise */ static int loomem( x, y ) register int x, y; { register int w; if ( !DEFINED(y) ) return TRUE; w = (node_array[x]->node_type == N_ITER) ? x : head(x); for ( ; DEFINED(w); w = head(w) ) if ( w == y ) return TRUE; return FALSE; } /* * set dom(v) to immediate dominator of v, based on arcs as stored in inarcs * (i.e. pretending the graph is reducible if it isn't). * Algorithm is from Hecht and Ullman, Analysis of a simple algorithm for * global flow analysis problems, except bit vector operations replaced by * search through DOM to save quadratic blowup in space */ static getdom() { register int v; register int i; register struct list *ls; for (v = 0; v < node_count; ++v) dom(v) = NONE; for (i = 1; i < access_count; ++i) { v = after(i); for (ls = inarc(v); ls; ls = ls->next_list) { dom(v) = comdom( dom(v), ls->element ); } } } /* find closest common dominator of u,v */ static int comdom( u, v ) register int u, v; { if (u == NONE) return(v); if (v == NONE) return(u); while(u != v) { if (ntoaft(u) < ntoaft(v)) v = dom(v); else u = dom(u); } return(u); } /* * use inarc, dom, and head to build tree representing structure of program. * Each node v has children denoted by * node_array[v]->child[0], node_array[v]->child[1], ... * representing code nested within v * * node_array[v]->right_sibling is right sibling of v or NONE, * and represents code following v at the same level of nesting, */ /* build tree */ static gettree() { register int v, u, from; register int i; register int found; register struct node *from_node; for ( v = 0; v < node_count; ++v ) { node_array[v]->right_sibling = NONE; for ( i = 0; i < CHILDNUM(v); ++i ) node_array[v]->child[i] = NONE; } for (i = access_count-1; i > 0; --i) { v = after(i); found = FALSE; /* the unique element of inarc(v) or NONE */ from = one_element( inarc(v) ); if ( DEFINED(from) ) { from_node = node_array[from]; if ( ( from_node->node_type == N_BRANCH || from_node->node_type == N_IF || from_node->node_type == N_ORIF ) && ( head(v) == head(from) || asoc( v, exit_size ) != -1 ) ) { /* * place in clause of N_BRANCH, N_[OR]IF if in smallest loop * containing it or if size of code for v is <= exit_size */ if ( from_node->arcs[THEN_ARC] == v ) { from_node->child[THEN_ARC] = v; found = TRUE; } else { from_node->child[ELSE_ARC] = v; found = TRUE; } } else if ( node_array[v]->node_type == N_ITER || from_node->node_type == N_ITER ) { /* N_LOOP -> N_ITER -> BODY always in same loop */ from_node->child[0] = v; found = TRUE; } else if ( node_array[from]->node_type == N_SWITCH ) { if ( from_node->arcs[1] == v ) { from_node->child[0] = v; found = TRUE; } } } if ( found ) continue; if ( loomem( v, head(dom(v)) ) ) { /* v is in smallest loop containing dom(v) */ insib( dom(v), v ); } else { /* * make v follow N_LOOP heading largest loop * containing dom(v) but not v */ for ( u = head(dom(v)); head(u) != head(v); u = head(u) ) ; insib( node_array[u]->varpart[V_FATHER], v ); } } } /* * make right_sibling[w] = v, and make * right_sibling[ rightmost sibling of v ] = previous right_sibling[w] */ static insib( w, v ) register int w, v; { register int u, temp; temp = node_array[w]->right_sibling; node_array[w]->right_sibling = v; for ( u = v; DEFINED(node_array[u]->right_sibling); u = node_array[u]->right_sibling ) ; node_array[u]->right_sibling = temp; } /* return # of nodes associated with v if <= n, -1 otherwise */ static asoc( v, n ) register int v; register int n; { register int count, i, temp; register int w; i = node_array[v]->node_type; if ( i == N_FLOW || i == N_IF || i == N_BRANCH || i == N_SWITCH || i == N_END ) count = node_array[v]->end_address - node_array[v]->start_address; else count = 1; for ( i = 0; i < CHILDNUM(v); ++i ) { w = node_array[v]->child[i]; if ( !DEFINED(w) ) continue; temp = asoc( w, n-count ); if ( temp == -1 ) return -1; count += temp; if ( count > n ) return -1; } if ( DEFINED(node_array[v]->right_sibling) ) { temp = asoc( node_array[v]->right_sibling, n - count ); if ( temp == -1 ) return -1; count += temp; } if ( count > n ) return -1; else return count; } /* * list manipulation functions */ /* make a list, insert it in front of ls */ static struct list * consls( v, ls ) register int v; register struct list *ls; { register struct list *temp; temp = (struct list *) malloc( sizeof(struct list) ); temp->element = v; temp->next_list = ls; return temp; } /* free a list */ static freelst( ls ) register struct list *ls; { if ( ls == NULL ) return; if ( ls->next_list != NULL ) freelst( ls->next_list ); free( ls ); } /* return element only if it is only element in list */ static int one_element( ls ) register struct list *ls; { if ( ls == NULL ) return NONE; if ( ls->next_list ) return NONE; return ls->element; }